% Two-panel figure: OOD accuracy plotted against (a) observed consistency and
% (b) error consistency. Each panel is a subfigure with its own caption and
% label; the figure-level caption and label come last.
% Placement is [ht] rather than a bare [h]: LaTeX promotes a lone [h] to [ht]
% with a warning whenever the float does not fit at the call site.
\begin{figure}[ht]
    \centering
    % Panel (a): observed consistency.
    % NOTE(review): the label key says "error_consistency_12_datasets" while the
    % panel shows observed consistency; key kept unchanged so existing \ref's
    % still resolve -- confirm the naming is intentional.
    \begin{subfigure}{0.45\textwidth}
        \centering
        \includegraphics[width=\linewidth]{scatter-plot_OOD-accuracy_vs_observed-consistency_multiple-datasets.pdf}
        %\vspace{-0.1cm}
        \caption{Out-of-distribution accuracy vs.\\observed consistency}
        \label{subfig:error_consistency_12_datasets}
    \end{subfigure}
    % Panel (b): error consistency.
    \begin{subfigure}{0.45\textwidth}
        \centering
        \includegraphics[width=\linewidth]{scatter-plot_OOD-accuracy_vs_error-consistency_multiple-datasets.pdf}
        %\vspace{-0.1cm}
        \caption{Out-of-distribution accuracy vs.\\error consistency}
        \label{subfig:error_consistency_5_datasets}
    \end{subfigure}
    % Manual tightening of the gap between the panels and the main caption.
    \vspace{-0.1cm}
    \caption{Observed consistency and error consistency between models and humans as a function of out-of-distribution (OOD) accuracy. Dotted lines indicate consistency expected by chance.}
    % The label must follow \caption: \caption is what steps the figure counter,
    % so a label placed before it would not resolve to this figure's number.
    \label{fig:error_consistency_12_and_5_datasets}
\end{figure}